import pandas as pd
# Load the Shanghai restaurant dataset from a UTF-8 encoded CSV file.
data = pd.read_csv('上海餐饮数据.csv', encoding='utf8')

# Show the raw row count followed by the frame itself.
total_rows = data.shape[0]
print(total_rows)
print(data)

# NOTE: an earlier variant of this script loaded the same file with
# index_col=1 and printed data.size alongside len(data); it is not used here.

# Unique values of the '类别' column (drop_duplicates keeps the first
# occurrence of each value by default).
category_column = data['类别']
dishes = category_column.drop_duplicates()
print(dishes)
print('去重之后的所有菜品总数为：', dishes.size)

# The frame has not been modified yet, so this is still the raw row count.
print(data.shape[0])

# Remove fully duplicated rows in place, then report how many rows remain.
data.drop_duplicates(inplace=True)
print('去重之后的所有记录个数为：', data.shape[0])
